
<html>
<head>
    <meta http-equiv="content-type" content="text/html; charset=utf-8" />
    <meta name="author" content="duchanh" />
    <title>Crawl</title>
</head>
<?php

// Demo script: uses H_Crawl to pull a single article from the URL below and
// dumps the extracted, link-free content with var_export().

// require_once instead of include: if the class file is missing, include only
// raises a warning and the script then dies later at `new H_Crawl()` with an
// unrelated "class not found" error. require_once stops right here with the
// real cause, and also guards against loading the class twice.
require_once 'crawl.class.php';

$link = 'http://thethao.vnexpress.net/tin-tuc/sea-games-27/tuyen-nu-viet-nam-thang-tung-bung-ngay-ra-quan-2923453.html';

$H_Crawl = new H_Crawl();

// Remove all javascript (<script>) tags and every tag with class "thumblock"
// from the crawled markup.
$H_Crawl->arr_att_clean = array('script', '.thumblock');

// Fetch the article title.
// NOTE(review): $title is assigned but never output by this script.
$title = $H_Crawl->getTitle($link, 'div.title_news h1');

// Fetch the article body.
// NOTE(review): the body is also read through getTitle(); this presumably works
// because the method returns whatever the selector matches — confirm against
// crawl.class.php whether a dedicated content method was intended.
$content = $H_Crawl->getTitle($link, 'div.fck_detail');

// Remove all links from the article body.
$content = $H_Crawl->removeLink($content);

var_export($content);
?>
<body>
</body>
</html>